﻿using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.Text.RegularExpressions;

namespace Spider.Parser
{
    /// <summary>
    /// <see cref="ParserBase"/> specialization whose context is the plain text of the
    /// first <c>&lt;p&gt;…&lt;/p&gt;</c> paragraph found in the supplied HTML.
    /// </summary>
    public class BaixingParser : ParserBase
    {
        /// <summary>
        /// Extracts the text between the first literal <c>&lt;p&gt;</c> tag and the nearest
        /// following <c>&lt;/p&gt;</c>, then strips any markup nested inside it.
        /// </summary>
        /// <param name="html">HTML markup to search.</param>
        /// <returns>
        /// The paragraph content with every <c>&lt;…&gt;</c> tag removed, or an empty string
        /// when no such paragraph is found.
        /// </returns>
        protected override string GetContext(string html)
        {
            // (?is): case-insensitive, and '.' also matches line breaks. The lookarounds keep
            // the <p> / </p> delimiters out of the captured value; ".+?" is lazy so the match
            // stops at the first closing tag. Only a bare "<p>" (no attributes) qualifies.
            Match paragraph = Regex.Match(html, @"(?is)(?<=<p>).+?(?=</p>)");

            // Remove the tags inside the paragraph so that only plain text is returned.
            // An unsuccessful match has an empty Value, which simply yields an empty string.
            var tagPattern = new Regex(@"<[^>]*>", RegexOptions.IgnoreCase);
            return tagPattern.Replace(paragraph.Value, string.Empty);
        }
    }
}
